#include <torch/extension.h>
#include "cuda/kernel.h"  // Include the CUDA header

// Python binding entry point. The module name is supplied by the
// TORCH_EXTENSION_NAME macro; the second macro argument names the
// module handle used inside the body.
PYBIND11_MODULE(TORCH_EXTENSION_NAME, module)
{
    // Register the native `add_cuda` function under the Python name
    // "add_cuda", with the docstring shown by help().
    module.def(
        "add_cuda",
        &add_cuda,
        "Element-wise addition (CUDA)");
}